# Environment and learning settings.
# NOTE(review): the meanings below are inferred from the key names only; the
# code that reads this file is not visible here -- confirm before relying on them.

# Presumably the grid dimensions (rows x columns) of the environment.
N_ROWS = 3
N_COLS = 2
# Presumably the number of robots, stacks, and distinct item types.
N_ROBOTS = 1
N_STACKS = 2
N_ITEMS = 1
# Presumably the probability (0..1) that a new order appears; what it is applied
# per (time step, item, ...) cannot be determined from this file -- TODO confirm.
ORDER_PROB = 0.1

# Presumably hyperparameters of the learning update rule (e.g. Q-learning; verify).
# Assumed step size of each update.
LEARNING_RATE = 0.4
# Assumed discount applied to future rewards.
DISCOUNT_FACTOR = 0.9